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} Until ... 
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socket <) -> s f_so eke t (domain, service, protocol) 

if (this is a TCP .socket) { 

if (called for the first time) { 

perform SAN transport initialization; 
Start up SAN Transport; 

fd = socket (domain, service, protocol) 
Note fd of first socket call; 
return ( f d) ; 

} 

else { 

fd = socket (domain, service, protocol) 
return ( f d) ; 

} 

} 

else 

return (socket (domain, service, protocol) 



bind() sf_bind (fd, sockaddr, addrlen) { 

Note IP address & port #; 

if (this is a TCP socket} { 

if {port is specified) 

note fd as service fd for this port; 

return (bind (fd, sockaddr, addrlen)); 



return (bind (fd, sockaddr, addrlen)); 



else 
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connect () ~> sf_connect (fd, sockaddr, addrlen) { 

Note IP address & port #; 

if (this is a TCP socket) { 

if (this is a non-blocking socket) { 

if (CONNECTION_REQUEST msg not previously sent for this fd) 
send CONNECTION__REQUEST msg with fd to proxy node; 

if (ACCEPT_CONNECTI0N or RE JECT_CONNECTION msg is pending) { 

if (receive ACCEPT_CONNECTION msg) { 

assign mapped fd by mapping OS-assigned fd to a transport fd; 

return (success) ; 

} 

else 

return (connection refused error) ; 

} 

else 

return (connection in progress) ; 

□ > 

In 

j|J wait to receive (ACCEPT_CONNECTION or RE JECT_CONNECTION msg) ; 
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else { 

send CONNECT ION_REQUE ST msg with fd to proxy node; 



if (receive ACCEPT_CONNECTION msg) { 
:s f assign mapped fd by mapping OS-assigned fd to a transport fd; 

'^1 return (success) ; 



else 

return (connection refused error) 



else 

return (connect (fd, sockaddr, addrlen)' 
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listen () --> sf_listen (f d, backlog) { 

switch (type of fd) { 

case service fd: 

send JOIN_SERVICE msg; 
return (success) ; 

case mapped fd: 

case transport fd: 

return (exception error) ; 

default: 

return ( listen (fd, backlog)) 
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accept () — > sf_accept (fd, clientaddr, len) { 

switch (type of fd) { 

case service fd: 

if (this is a non-blocking socket) { 

if CONNECTION_REQUEST msg is pending for this service fd { 

read CONNECTION__REQUEST msg with proxy-assigned flow id; 

if (connection can be accepted) { 
send ACCEPT_CONNECTI0N msg; 
return (flow id); 

} 

else { 

send RE JECT_CONNECTION msg; 
return (try again) ; 

} 

} 

else 

return (try again) ; 

} 

else { 



,2 while (1) { 



if CONNECTION_REQUEST msg is pending for this service fd { 
read CONNECTION_REQUEST msg with proxy-assigned flow id; 



yi if (connection can be accepted) { 

si send ACCEPT_CONNECTION msg; 

|2 return (flow id) ; 



else { 

send RE JECT_CONNECTION msg; 



} 

else 

wait to receive CONNECTION_REQUEST msg; 



} // while loop 



} 



case transport fd: 

return (exception error) ; 

default: 

return ( accept (fd, clientaddr, len)); 




select () -> sf_select (nfds, readfds, writefds, exceptfds, timeout) { 
note the number of fds to select on; 

set timeslice as a function of timeout and number of fds; 

do forever { 

// PHASE 1: POLL ALL FDs 

for each service fd in readfds { 

if CONNECT ION_REQUE ST msg is pending for this service fd 
set corresponding service fd as available; 

} 

for each transport fd in readfds { 

if DATA msg is pending for this transport fd 
set corresponding transport fd as available; 

} 

for each mapped fd in readfds { 

perform mapping to transport fd; 

if DATA msg is pending for this transport fd 

set corresponding mapped fd as available; 

} 



for each transport fd in writefds { 

if DATA msg can be sent on this transport fd 
set corresponding transport fd as available; 

} 

jjjj for each mapped fd in writefds { 

perform mapping to transport fd; 
^ if DATA msg can be sent for this transport fd 

Hl 4 set corresponding mapped fd as available; 

m > 

|*Q for each service fd in exceptfds { 

j^j if exception occurs for this service fd 

set corresponding service fd; 

} 



i £ 



\Tl for each transport fd in exceptfds { 

if exception occurs for this transport fd 
^ set corresponding transport fd; 

u ] 

for each mapped fd in exceptfds { 
!*j 5 perform mapping to transport fd; 

if exception occurs for this transport fd 
set corresponding mapped fd; 

o > 

^ for al other fds 

call original system selector- 
combine all available descriptors; 

if (one or more descriptors are ready) 

return (number of descriptors available) ; 
else 

choose one descriptor in readfds to wait on; // heuristic-based choice 

restore original descriptor sets; 

if (time is up AND no fd is available) 
return (timed out); 

// PHASE 2: WAIT if necessary 

wait for arrival of CONNECTION_REQUEST, ACCEPT_CONNECTION , 

REJECT_CONNECTION or DATA msg for the chosen descriptor, up to timeslice; 
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recv() -> sf_recv (fd, buf, len, flags) { 

switch (type of fd) { 

case service fd: 

return {exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if (MSG_WAITALL flag is not set) { 

if at least one DATA msg is pending for this transport fd { 
receive data into buf; 
return (number of bytes read) ; 

} 

else { 

if (this is a non-blocking socket) 
return (resource not available) ; 
else { 

wait to receive a DATA msg for this transport fd; 

receive data into buf; 

return (number of bytes read) ; 

o ) 

*0 } 

% 5 else { 

.2* wait until all len bytes of DATA msgs for this transport fd arrives; 

receive data into buf; 
ftj return (number of bytes read) ; 



m 

Q 



} 



default: 

return ( recv (fd, buf, len) ) ; 

} 
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send() -> sf_send (fd, buf, len, flags) { 

switch (type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if (this is a non-blocking socket) { 

if (no DATA msg can be sent at this time) 

return (try again) ; 
else 

send DATA msg(s) with data f rorrv buf in non-blocking fashion; 

} 

else { 

if ( no DATA msg can be sent at this time) 

Wait until atleast one DATA msg can be sent; 
send DATA msg(s) with data from buf; 

} 

return (number of bytes sent) ; 



2 default: 



return (send (fd, buf, len)); 
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read ( ) -> sf_read (fd, buf, len) { 

switch (type of fd) { 

case service fd: 

return {exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if at least one DATA msg is pending for this transport fd { 

receive data into buf; 

return (number of bytes read) ; 

} 

else { 

if (this is a non-blocking socket) 
return (resource not available) ; 
else { 

wait to receive a DATA msg for this transport fd; 

receive data into buf; 

return (number of bytes read) ; 

} 



Us default: 

IB return ( read (fd, buf, len)); 





write () -> sf_write (fd, buf, len) { 

switch (type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 



if (this is a non-blocking socket) { 

if (no DATA msg can be sent at this time) 

return (try again) ; 
else 

send DATA msg(s) with data from buf in non-blocking fashion 



else { 

if ( no DATA msg can be sent at this time) 

Wait until atleast one DATA msg can be sent; 
send DATA msg(s) with data from buf; 



return (number of bytes written) ; 
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default: 



return (write (fd, buf, len)); 






readv() -> sf_readv (fd, vector__buf, vector_count) { 

switch (type of fd) { 

case service fd: 

return {exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if at least one DATA msg is pending for this transport fd { 
scatter data received into vector_buf; 
■ return (number of bytes read) ; 



else { 

if (this is a non-blocking socket) 
return (resource not available) ; 
else { 

wait to receive a DATA msg for this transport fd; 
scatter data received into vector_buf; 
return (number of bytes read) ; 



□ 



default: 



return ( readv (fd, buf, len) ) ; 
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writev() -> sf_writev (fd, vector_buf, vector_count) { 

switch (type of fd) { 

case service fd: 

return {exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 



if (this is a non-blocking socket) { 

if (no DATA msg can be sent at this time) 

return (try again) ; 
else 

send DATA msg(s) with gathered data from vector_buf; 



else { 

if ( no DATA msg can be sent at this time) 

Wait until atleast one DATA msg can be sent; 
send DATA msg(s) with gathered data from vector_buf; 



return (number of bytes written) ; 



default: 




return (writev (fd, buf, len) ) ; 






ioctl() -> sf_ioctl (fd, request, arg) { 

switch (type of fd) { 

case service fd: 

return (socket not connected error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

switch (request) { 



case FIONBIO: 

set non-blocking I/O variable to value in arg; 

return (success) ; 
case FIOASYNC: 

set async I/O variable to value in arg; 

return (success) ; 
case FIONREAD: 

peek at DATA msg for this transport fd; 

set number of bytes in arg; 

return (success) ; 
default: 

return (warning: option not meaningful in SAN Transport); 
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default: 



return (ioctl (fd, request, arg) ) ; 
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getsockname () -> sf_getsockname (fd, localaddr, addrlen) { 

switch (type of fd) { 

case service fd: 

return (socket not connected error) ; 

case mapped fd: 

perform mapping to transport • fd; 

case transport fd: 

return (local protocol address associated with this transport fd) 



default: 



return (getsockname (fd, localaddr, addrlen) ) ; 






getpeername () -> sf_getpeername (fd, localaddr, addrlen) { 

switch {type of fd) { 

case service fd: 

return (socket not connected error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if (information is available from the proxy node) 

return (foreign protocol address associated with this transport fd) ; 
else 

return (address not available) ; 



default: 



return (getpeername (fd, localaddr, addrlen) ) ; 
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getsockoptO sf_getsockopt (fd, level, optname, optval, optlen) { 

if (level == SOL_SOCKET) { 
switch (type of fd) { 

case service fd: 

return (warning: setsockoptO not meaningful for service fd) ; 
case mapped fd: 

perform mapping to transport fd; 



case transport fd: 

switch (optname) { 
case SO_RCVBUF: 
case SO_SNDBUF: 

if (buffering supported by proxy node) { 

get corresponding state variable and place value in optval; 
return (success); 

} 

else 

return (unable to get buffer sizes); 



case SO_LINGER: 
case SO_RCVLOWAT: 
case SO_SNDLOWAT: 

get corresponding state variable and place value in optval; 

return (success); 
i*j case SO_TYPE: 

^ return (SOCK_STREAM) ; 

"0 default: 

■~j return (warning: option not meaningful in SAN Transport); 

jT 4 ^ 



B default: 

return { getsockopt ( f d, level, optname, optval, optlen) ); 

} 



iil > 



if (level == IPPR0T0_TCP) { 
f^L switch (type of fd) { 

3 - 

;U case service fd: 



□ 



return (warning: setsockoptO not meaningful for service fd) ; 
case mapped fd: 

perform mapping to transport fd; 
s& case transport fd: 

switch (optname) { 
case TCP_MAXSEG: 

get segment size of SAN transport and place value in optval; 
return ( success ) ; 
case TCP_NODELAY : 

if (no-delay option is known) { 
get value and place in optval; 
return (success) ; 

} 

else 

return (error) ; 



default: 

return (warning: option not meaningful in SAN Transport); 



default: 

return ( getsockopt ( f d, level, optname, optval, optlen) ); 

} 

} 

return (not implemented) ; 

} 



setsockoptO -> sf_setsockopt (fd, level, optname, optval , optlen) { 

if (level SOL_SOCKET) { 
switch (type of fd) { 
case service fd: 

return (warning: setsockoptO not meaningful for service fd) ; 
case mapped fd: 

perform mapping. to transport fd; 
case transport fd: 
switch (optname) { 
case SO_RCVBUF: 
case SO_SNDBUF: 

^ if (buffering supported by proxy node) { 

set corresponding state variable to value given by optval; 
communicate buffer size given by optval to proxy node; 
if (communication successful) 

return (success) ; 
else 

return (unable to set buffer size) ; 

} 

else 

return (unable to set buffer sizes); 

case SO_LINGER: 
case SO_RCVLOWAT : 
case SO_SNDLOWAT : 

set corresponding state variable to value given by optval; 
communicate optname and optval to proxy node; 
if (communication successful) 
'z** return (success) ; i — - ^ f 

H else KiG bQ 

sft return (unable to set option) ; 

default : 

return (warning: option not meaningful in SAN Transport); 

y default: 

111 return ( setsockopt { f d, level, optname, optval, optlen) ); 

} 



if (level == IPPROTOJTCP) { 
switch (type of fd) { 
case service fd: 

return (warning: setsockopt () not meaningful for service fd) ; 
case mapped fd: 

perform mapping to transport fd; 
case transport fd: 
switch (optname) { 
case TCP_MAXSEG: 

set segment size of SAN transport to value given by optval; 
return (success) ; 
case TCP_NODELAY: 

set no-delay variable to value given by optval; 
communicate optname and optval to the proxy node; 
if ('communication successful) 

return ( success ) ; 
else 

return (unable to set no-delay option) ; 
default: 

return (warning: option not meaningful in SAN Transport); 



default: 

return ( setsockopt ( fd, level, optname, optval, optlen) ); 

} 

} 

return (not implemented) ; 



} 
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close () -> sf_close (fd) { 

switch (type of fd) { 

case service fd: 

send LEAVE_SERVICE msg on service fd; 

clean up transport resources associated with this service; 
return (close (fd) ) ; 

case mapped fd: 

perform mapping to transport fd; 

send CLOSE_CONNECTION msg on transport fd; 

reset fd mapping; 
return (close (fd) ) ; 

case transport fd: 

send CLOSE CONNECTION msg on transport fd; 



default: 

return (close ( fd) ) ; 



111 
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shutdown () -> sf_shutdown (fd, howto) { 

if (howto == SHUT_RD) { 

if (fd already closed for writes) 
set full__shutdown_f lag to TRUE; 
else 

note that fd is closed for further reads; 

} 

if (howto == SHUT_WR) { 

if .(fd already closed for reads) 

set full_shutdown_f lag to TRUE; 
else 

note that fd is closed for further writes; 



if (howto == SHUT_RDWR) { 

set full_shutdown__f lag to TRUE; 



if (full_shutdown_flag — TRUE) { 

switch (type of fd) { 
case service fd: 

send LEAVE_SERVICE msg on service fd; 

clean up transport resources associated with this service; 



jfj breaks- 



case mapped fd: 

perform mapping to transport fd; 
Si send CLOSE_CONNECTION msg on transport fd; 

\J\ reset fd mappings- 

break; 

3: 

case transport fd: 
3^ send CLOSE_CONNECTION msg on transport fd; 

breaks- 



default: 

return ( shutdown (fd, hotwo) ) 



return ( shutdown (fd, howto) ) ; 



